# -*- coding: utf-8 -*-
"""
Clusters por instituciones
"""
'\nClusters por instituciones\n'
%%HTML
<script src="require.js"></script>
# Importar librerías
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from matplotlib.pyplot import figure
import plotly.express as px
import seaborn as sns
import plotly.graph_objects as go
import plotly.io as pio
# Make 'notebook' the default Plotly renderer used by every fig.show() below.
pio.renderers.default = "notebook"
Datos de entrada (Google Drive):
- Cluster.infoInstituciones.csv: https://drive.google.com/drive/u/0/folders/1APVnfD1zPgTHFAr0YMG6UMTwZ52MQVa9
- Cluster.cluster.csv: https://drive.google.com/file/d/16hq2o-oAD0chAqEgqEKn9Uu_dOitLPcj/view
# Mount the user's Google Drive inside the Colab runtime at /content/drive/.
from google.colab import drive
drive.mount('/content/drive/')
Mounted at /content/drive/
%cd /content/drive/My Drive/3BIO-Cluster-DataAnalysis
/content/drive/My Drive/3BIO-Cluster-DataAnalysis
%ls
Cluster.cluster.csv Cluster.infoGrupos.csv Cluster.infoInstituciones.csv
# Data: load the per-institution table from the current working directory
# and display it.
df = pd.read_csv("Cluster.infoInstituciones.csv")
df
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | trabajos_grado | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | A.I.D Biohacking Colombia Avalado | 1 | 2017.0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 0.0 | ... | 0.0 | 6.0 | 1.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| 1 | Aalborg University No Avalado | 1 | 2012.0 | 10.0 | 1.0 | 3.0 | 1.0 | 2.0 | 4.0 | 0.0 | ... | 13.0 | 13.0 | 7.0 | 1.0 | 0.0 | 3.0 | 0.0 | 0.0 | 1.0 | 0.0 |
| 2 | Abogato Jurídico S.A.S. Avalado | 1 | 2018.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 0.0 | 6.0 | 0.0 | 1.0 | 1.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| 3 | Abya-Ayala No Avalado | 1 | 2014.0 | 9.0 | 0.0 | 0.0 | 2.0 | 7.0 | 0.0 | 0.0 | ... | 1.0 | 1.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| 4 | Academia Américana De Psiquiatría No Avalado | 1 | 2008.0 | 5.0 | 0.0 | 0.0 | 0.0 | 0.0 | 12.0 | 0.0 | ... | 10.0 | 40.0 | 1.0 | 10.0 | 1.0 | 16.0 | 0.0 | 0.0 | 1.0 | 0.0 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 1437 | Washington State University No Avalado | 1 | 2010.0 | 31.0 | 11.0 | 2.0 | 0.0 | 1.0 | 7.0 | 0.0 | ... | 7.0 | 25.0 | 6.0 | 10.0 | 1.0 | 8.0 | 0.0 | 0.0 | 3.0 | 0.0 |
| 1438 | Yarima Guadua E. U. No Avalado | 1 | 2000.0 | 141.0 | 18.0 | 14.0 | 14.0 | 24.0 | 19.0 | 0.0 | ... | 131.0 | 62.0 | 10.0 | 22.0 | 3.0 | 20.0 | 0.0 | 0.0 | 6.0 | 3.0 |
| 1439 | Yoluka Ong, Fundación De Investigación En Biod... | 1 | 2008.0 | 25.0 | 2.0 | 4.0 | 7.0 | 2.0 | 18.0 | 0.0 | ... | 16.0 | 6.0 | 1.0 | 3.0 | 0.0 | 2.0 | 0.0 | 0.0 | 2.0 | 0.0 |
| 1440 | Zumo Tecnologia Avalado | 1 | 2013.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 11.0 | ... | 7.0 | 10.0 | 0.0 | 5.0 | 1.0 | 4.0 | 0.0 | 0.0 | 2.0 | 0.0 |
| 1441 | Zurich S.A. No Avalado | 1 | 2012.0 | 16.0 | 6.0 | 2.0 | 0.0 | 3.0 | 0.0 | 0.0 | ... | 2.0 | 2.0 | 1.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
1442 rows × 22 columns
# Load the table that carries the 'Cluster' label per institution and display it.
dfi = pd.read_csv("Cluster.cluster.csv")
dfi
| Unnamed: 0 | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | libros | softwares | ... | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Instituciones | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 1.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | A.I.D Biohacking Colombia Avalado | 4 |
| 1 | 1 | 10.0 | 1.0 | 3.0 | 1.0 | 2.0 | 4.0 | 0.0 | 1.0 | 0.0 | ... | 7.0 | 1.0 | 0.0 | 3.0 | 0.0 | 0.0 | 1.0 | 0.0 | Aalborg University No Avalado | 4 |
| 2 | 2 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 0.0 | 1.0 | 1.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | Abogato Jurídico S.A.S. Avalado | 4 |
| 3 | 3 | 9.0 | 0.0 | 0.0 | 2.0 | 7.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | Abya-Ayala No Avalado | 4 |
| 4 | 4 | 5.0 | 0.0 | 0.0 | 0.0 | 0.0 | 12.0 | 0.0 | 0.0 | 1.0 | ... | 1.0 | 10.0 | 1.0 | 16.0 | 0.0 | 0.0 | 1.0 | 0.0 | Academia Américana De Psiquiatría No Avalado | 4 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 1437 | 1437 | 31.0 | 11.0 | 2.0 | 0.0 | 1.0 | 7.0 | 0.0 | 2.0 | 0.0 | ... | 6.0 | 10.0 | 1.0 | 8.0 | 0.0 | 0.0 | 3.0 | 0.0 | Washington State University No Avalado | 1 |
| 1438 | 1438 | 141.0 | 18.0 | 14.0 | 14.0 | 24.0 | 19.0 | 0.0 | 0.0 | 0.0 | ... | 10.0 | 22.0 | 3.0 | 20.0 | 0.0 | 0.0 | 6.0 | 3.0 | Yarima Guadua E. U. No Avalado | 3 |
| 1439 | 1439 | 25.0 | 2.0 | 4.0 | 7.0 | 2.0 | 18.0 | 0.0 | 0.0 | 0.0 | ... | 1.0 | 3.0 | 0.0 | 2.0 | 0.0 | 0.0 | 2.0 | 0.0 | Yoluka Ong, Fundación De Investigación En Biod... | 4 |
| 1440 | 1440 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 11.0 | 0.0 | 0.0 | ... | 0.0 | 5.0 | 1.0 | 4.0 | 0.0 | 0.0 | 2.0 | 0.0 | Zumo Tecnologia Avalado | 4 |
| 1441 | 1441 | 16.0 | 6.0 | 2.0 | 0.0 | 3.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 1.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | Zurich S.A. No Avalado | 4 |
1442 rows × 22 columns
# Append the 'Cluster' column of `dfi` to `df`.
# The join is index-based, so both frames must share the same row order.
clusters = dfi.loc[:, "Cluster"]
dfm = df.join(clusters, how="left")
dfm
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | A.I.D Biohacking Colombia Avalado | 1 | 2017.0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 0.0 | ... | 6.0 | 1.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 1 | Aalborg University No Avalado | 1 | 2012.0 | 10.0 | 1.0 | 3.0 | 1.0 | 2.0 | 4.0 | 0.0 | ... | 13.0 | 7.0 | 1.0 | 0.0 | 3.0 | 0.0 | 0.0 | 1.0 | 0.0 | 4 |
| 2 | Abogato Jurídico S.A.S. Avalado | 1 | 2018.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 6.0 | 0.0 | 1.0 | 1.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 3 | Abya-Ayala No Avalado | 1 | 2014.0 | 9.0 | 0.0 | 0.0 | 2.0 | 7.0 | 0.0 | 0.0 | ... | 1.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 4 | Academia Américana De Psiquiatría No Avalado | 1 | 2008.0 | 5.0 | 0.0 | 0.0 | 0.0 | 0.0 | 12.0 | 0.0 | ... | 40.0 | 1.0 | 10.0 | 1.0 | 16.0 | 0.0 | 0.0 | 1.0 | 0.0 | 4 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 1437 | Washington State University No Avalado | 1 | 2010.0 | 31.0 | 11.0 | 2.0 | 0.0 | 1.0 | 7.0 | 0.0 | ... | 25.0 | 6.0 | 10.0 | 1.0 | 8.0 | 0.0 | 0.0 | 3.0 | 0.0 | 1 |
| 1438 | Yarima Guadua E. U. No Avalado | 1 | 2000.0 | 141.0 | 18.0 | 14.0 | 14.0 | 24.0 | 19.0 | 0.0 | ... | 62.0 | 10.0 | 22.0 | 3.0 | 20.0 | 0.0 | 0.0 | 6.0 | 3.0 | 3 |
| 1439 | Yoluka Ong, Fundación De Investigación En Biod... | 1 | 2008.0 | 25.0 | 2.0 | 4.0 | 7.0 | 2.0 | 18.0 | 0.0 | ... | 6.0 | 1.0 | 3.0 | 0.0 | 2.0 | 0.0 | 0.0 | 2.0 | 0.0 | 4 |
| 1440 | Zumo Tecnologia Avalado | 1 | 2013.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 11.0 | ... | 10.0 | 0.0 | 5.0 | 1.0 | 4.0 | 0.0 | 0.0 | 2.0 | 0.0 | 4 |
| 1441 | Zurich S.A. No Avalado | 1 | 2012.0 | 16.0 | 6.0 | 2.0 | 0.0 | 3.0 | 0.0 | 0.0 | ... | 2.0 | 1.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
1442 rows × 23 columns
# Peek at the first five rows of the merged table.
dfm.iloc[:5]
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | A.I.D Biohacking Colombia Avalado | 1 | 2017.0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 0.0 | ... | 6.0 | 1.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 1 | Aalborg University No Avalado | 1 | 2012.0 | 10.0 | 1.0 | 3.0 | 1.0 | 2.0 | 4.0 | 0.0 | ... | 13.0 | 7.0 | 1.0 | 0.0 | 3.0 | 0.0 | 0.0 | 1.0 | 0.0 | 4 |
| 2 | Abogato Jurídico S.A.S. Avalado | 1 | 2018.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 6.0 | 0.0 | 1.0 | 1.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 3 | Abya-Ayala No Avalado | 1 | 2014.0 | 9.0 | 0.0 | 0.0 | 2.0 | 7.0 | 0.0 | 0.0 | ... | 1.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 4 | Academia Américana De Psiquiatría No Avalado | 1 | 2008.0 | 5.0 | 0.0 | 0.0 | 0.0 | 0.0 | 12.0 | 0.0 | ... | 40.0 | 1.0 | 10.0 | 1.0 | 16.0 | 0.0 | 0.0 | 1.0 | 0.0 | 4 |
5 rows × 23 columns
# Peek at the last five rows of the merged table.
dfm.iloc[-5:]
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1437 | Washington State University No Avalado | 1 | 2010.0 | 31.0 | 11.0 | 2.0 | 0.0 | 1.0 | 7.0 | 0.0 | ... | 25.0 | 6.0 | 10.0 | 1.0 | 8.0 | 0.0 | 0.0 | 3.0 | 0.0 | 1 |
| 1438 | Yarima Guadua E. U. No Avalado | 1 | 2000.0 | 141.0 | 18.0 | 14.0 | 14.0 | 24.0 | 19.0 | 0.0 | ... | 62.0 | 10.0 | 22.0 | 3.0 | 20.0 | 0.0 | 0.0 | 6.0 | 3.0 | 3 |
| 1439 | Yoluka Ong, Fundación De Investigación En Biod... | 1 | 2008.0 | 25.0 | 2.0 | 4.0 | 7.0 | 2.0 | 18.0 | 0.0 | ... | 6.0 | 1.0 | 3.0 | 0.0 | 2.0 | 0.0 | 0.0 | 2.0 | 0.0 | 4 |
| 1440 | Zumo Tecnologia Avalado | 1 | 2013.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 11.0 | ... | 10.0 | 0.0 | 5.0 | 1.0 | 4.0 | 0.0 | 0.0 | 2.0 | 0.0 | 4 |
| 1441 | Zurich S.A. No Avalado | 1 | 2012.0 | 16.0 | 6.0 | 2.0 | 0.0 | 3.0 | 0.0 | 0.0 | ... | 2.0 | 1.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
5 rows × 23 columns
# Rank institutions by article count (highest first) and keep the first ten.
dfm = dfm.sort_values(by='articulos', ascending=False)
dfsm = dfm.iloc[:10]

# Pie chart of the article counts of those ten institutions.
fig = px.pie(dfsm, names='Instituciones', values='articulos')
fig.show()
# Box plots for the top-10 table: each metric group is drawn twice,
# coloured first by cluster and then by institution.
for _metrics in (['articulos', 'capitulos', 'trabajos_grado'],
                 ['innovaciones', 'libros', 'softwares']):
    for _hue in ("Cluster", 'Instituciones'):
        fig = px.box(dfsm, y=_metrics, color=_hue, points="all")
        fig.show()
dfsm
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1378 | Universidad Nacional De Colombia Avalado | 621 | 2003.383253 | 50978.0 | 10304.0 | 5687.0 | 6429.0 | 4353.0 | 13554.0 | 526.0 | ... | 19521.0 | 4836.0 | 6238.0 | 620.0 | 3997.0 | 354.0 | 55.0 | 1007.0 | 508.0 | 1 |
| 1251 | Universidad De Antioquia Avalado | 262 | 2001.950382 | 27456.0 | 5957.0 | 3102.0 | 2955.0 | 2251.0 | 6737.0 | 290.0 | ... | 10198.0 | 2318.0 | 2735.0 | 381.0 | 2455.0 | 157.0 | 25.0 | 500.0 | 244.0 | 1 |
| 1287 | Universidad De Los Andes Avalado | 159 | 2002.893082 | 15636.0 | 5813.0 | 1945.0 | 1140.0 | 956.0 | 5545.0 | 105.0 | ... | 3833.0 | 1489.0 | 1158.0 | 81.0 | 487.0 | 107.0 | 20.0 | 246.0 | 160.0 | 1 |
| 1331 | Universidad Del Valle Avalado | 190 | 2001.926316 | 13215.0 | 2467.0 | 1502.0 | 1623.0 | 930.0 | 2743.0 | 137.0 | ... | 4555.0 | 1459.0 | 1233.0 | 121.0 | 896.0 | 120.0 | 24.0 | 344.0 | 127.0 | 1 |
| 1070 | Pontificia Universidad Javeriana Avalado | 112 | 2001.553571 | 12520.0 | 2118.0 | 1110.0 | 1257.0 | 1116.0 | 4791.0 | 127.0 | ... | 3074.0 | 1023.0 | 981.0 | 97.0 | 433.0 | 117.0 | 8.0 | 231.0 | 113.0 | 1 |
| 1353 | Universidad Industrial De Santander Avalado | 91 | 2001.131868 | 9872.0 | 1870.0 | 975.0 | 1444.0 | 674.0 | 1136.0 | 429.0 | ... | 4501.0 | 826.0 | 1297.0 | 152.0 | 1143.0 | 88.0 | 3.0 | 187.0 | 94.0 | 1 |
| 1333 | Universidad Distrital Francisco José De Caldas... | 124 | 2003.612903 | 9124.0 | 724.0 | 851.0 | 989.0 | 682.0 | 2354.0 | 66.0 | ... | 2988.0 | 726.0 | 889.0 | 122.0 | 601.0 | 77.0 | 2.0 | 168.0 | 36.0 | 1 |
| 1383 | Universidad Pedagógica Y Tecnológica De Colomb... | 155 | 2005.296774 | 8575.0 | 698.0 | 547.0 | 973.0 | 495.0 | 2754.0 | 285.0 | ... | 6851.0 | 940.0 | 1603.0 | 333.0 | 1951.0 | 74.0 | 7.0 | 252.0 | 33.0 | 1 |
| 1416 | Universidad Tecnológica De Pereira Avalado | 117 | 2005.136752 | 7950.0 | 994.0 | 628.0 | 693.0 | 402.0 | 1456.0 | 150.0 | ... | 3644.0 | 616.0 | 1020.0 | 121.0 | 884.0 | 57.0 | 0.0 | 158.0 | 56.0 | 1 |
| 1261 | Universidad De Cartagena Avalado | 99 | 2005.939394 | 7591.0 | 1113.0 | 609.0 | 1129.0 | 787.0 | 1315.0 | 103.0 | ... | 3228.0 | 464.0 | 535.0 | 151.0 | 964.0 | 44.0 | 2.0 | 153.0 | 52.0 | 1 |
10 rows × 23 columns
# Bar chart of the four SJR quartile columns for each top-10 institution.
fig = px.bar(
    dfsm,
    y="Instituciones",
    x=['SJR_Q_Q1', 'SJR_Q_Q2', 'SJR_Q_Q3', 'SJR_Q_Q4'],
    title="Clasificacion Articulos en SJR Q",
    text_auto=True,
    # Passing a list of columns makes this wide-form input: Plotly Express
    # names the melted columns "value" and "variable", so labels have to be
    # keyed on those names. The previous 'x'/'y' keys matched no column and
    # were silently ignored.
    labels={'value': 'Articulos', 'variable': 'Cuartil SJR'},
    color_discrete_map={'SJR_Q_Q4': 'green'},
)
# Treat institutions as categories and order them by their total bar length.
fig.update_yaxes(type='category', categoryorder='total ascending')
fig.show()
# Pie chart of the number of rows (institutions) in each cluster.
# reset_index() on the unnamed size Series yields a count column labelled 0.
_cluster_sizes = dfm.groupby('Cluster').size().reset_index()
fig = px.pie(_cluster_sizes, names='Cluster', values=0, title="Participación de Clusters")
fig.show()
# Percentage share of each output type within every cluster.
_output_cols = ['articulos', 'capitulos', 'innovaciones', 'libros', 'softwares']

# Select the columns *before* aggregating so that only these numeric columns
# are summed (the institution-name strings and 'year' are never aggregated).
generacion = dfm.groupby('Cluster')[_output_cols].sum().reset_index()

# Divide every row by its own total, then scale to percent and round last so
# the stored values are clean two-decimal percentages.
_row_totals = generacion[_output_cols].sum(axis=1)
generacion[_output_cols] = generacion[_output_cols].div(_row_totals, axis=0).mul(100).round(2)
generacion
| Cluster | articulos | capitulos | innovaciones | libros | softwares | |
|---|---|---|---|---|---|---|
| 0 | 0 | 85.41 | 13.80 | 0.36 | 0.22 | 0.21 |
| 1 | 1 | 71.60 | 22.62 | 2.17 | 0.73 | 2.88 |
| 2 | 2 | 61.73 | 27.51 | 5.16 | 0.77 | 4.83 |
| 3 | 3 | 65.13 | 22.22 | 6.78 | 0.94 | 4.92 |
| 4 | 4 | 62.36 | 28.34 | 5.65 | 0.80 | 2.85 |
# Percentage share of each staffing/training column within every cluster.
_staff_cols = ['trabajos_grado', 'integrantes', 'doctorado', 'maestria', 'Especializacion', 'pregrado']

# Select the columns *before* aggregating so that only these numeric columns
# are summed (the institution-name strings and 'year' are never aggregated).
instit = dfm.groupby('Cluster')[_staff_cols].sum().reset_index()

# Divide every row by its own total, then scale to percent and round last so
# the stored values are clean two-decimal percentages.
_row_totals = instit[_staff_cols].sum(axis=1)
instit[_staff_cols] = instit[_staff_cols].div(_row_totals, axis=0).mul(100).round(2)
instit
| Cluster | trabajos_grado | integrantes | doctorado | maestria | Especializacion | pregrado | |
|---|---|---|---|---|---|---|---|
| 0 | 0 | 47.36 | 30.14 | 5.90 | 7.88 | 2.47 | 6.24 |
| 1 | 1 | 67.06 | 18.61 | 4.02 | 5.71 | 1.01 | 3.60 |
| 2 | 2 | 67.05 | 17.90 | 4.82 | 6.38 | 1.00 | 2.86 |
| 3 | 3 | 40.01 | 35.20 | 2.61 | 9.48 | 5.15 | 7.56 |
| 4 | 4 | 62.93 | 21.65 | 3.04 | 6.69 | 1.90 | 3.78 |
# Box plots over the full table: each metric group is drawn twice,
# coloured first by cluster and then by institution.
for _metrics in (['articulos', 'capitulos', 'trabajos_grado'],
                 ['innovaciones', 'libros', 'softwares']):
    for _hue in ("Cluster", 'Instituciones'):
        fig = px.box(dfm, y=_metrics, color=_hue, points="all")
        fig.show()

# Re-order the table by cluster label, highest label first.
dfm = dfm.sort_values(by='Cluster', ascending=False)
dfm
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1176 | Team Ingenieria De Conocimiento Ltda Avalado | 2 | 2002.000000 | 34.0 | 2.0 | 1.0 | 1.0 | 3.0 | 11.0 | 13.0 | ... | 42.0 | 6.0 | 9.0 | 5.0 | 16.0 | 1.0 | 0.0 | 1.0 | 0.0 | 4 |
| 957 | Instituto Tecnológico Del Putumayo - Itp Avalado | 2 | 2000.000000 | 14.0 | 3.0 | 0.0 | 6.0 | 1.0 | 3.0 | 0.0 | ... | 60.0 | 2.0 | 12.0 | 7.0 | 12.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 56 | Asociacion De Profesionales Para La Investigac... | 1 | 2017.000000 | 14.0 | 4.0 | 0.0 | 4.0 | 1.0 | 1.0 | 0.0 | ... | 7.0 | 3.0 | 3.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4.0 | 0.0 | 4 |
| 1048 | Open Innovation Lab Sas Avalado | 1 | 2006.000000 | 14.0 | 0.0 | 0.0 | 0.0 | 1.0 | 51.0 | 0.0 | ... | 23.0 | 6.0 | 9.0 | 0.0 | 5.0 | 0.0 | 0.0 | 1.0 | 0.0 | 4 |
| 12 | Administrative Management Consultants Sas Avalado | 2 | 2013.500000 | 14.0 | 0.0 | 0.0 | 9.0 | 1.0 | 31.0 | 0.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 1143 | Sociedad Colombiana De Ciencias Hortícolas No ... | 1 | 1999.000000 | 480.0 | 70.0 | 43.0 | 63.0 | 75.0 | 134.0 | 1.0 | ... | 64.0 | 27.0 | 16.0 | 1.0 | 13.0 | 3.0 | 1.0 | 2.0 | 5.0 | 0 |
| 633 | Fundacion Valle Del Lili Avalado | 3 | 2005.333333 | 1523.0 | 452.0 | 269.0 | 284.0 | 198.0 | 94.0 | 3.0 | ... | 198.0 | 13.0 | 48.0 | 24.0 | 29.0 | 3.0 | 0.0 | 7.0 | 2.0 | 0 |
| 916 | Instituto De Investigación De Recursos Biológi... | 1 | 2010.000000 | 442.0 | 189.0 | 58.0 | 53.0 | 27.0 | 629.0 | 0.0 | ... | 158.0 | 30.0 | 70.0 | 8.0 | 39.0 | 2.0 | 0.0 | 15.0 | 1.0 | 0 |
| 332 | Corporación Centro Internacional De Entrenamie... | 1 | 1990.000000 | 455.0 | 229.0 | 44.0 | 68.0 | 7.0 | 11.0 | 0.0 | ... | 131.0 | 27.0 | 29.0 | 4.0 | 62.0 | 1.0 | 1.0 | 6.0 | 1.0 | 0 |
| 197 | Centro Internacional Para Prueba De Vacunas Y ... | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
1442 rows × 23 columns
# Pivot table: number of rows per cluster label.
dups = dfm.pivot_table(aggfunc='size', index='Cluster')
dups
Cluster 0 12 1 479 2 67 3 136 4 748 dtype: int64
# Order the per-cluster counts from largest to smallest.
dups = dups.sort_values(ascending=False)
dups
Cluster 4 748 1 479 3 136 2 67 0 12 dtype: int64
# Display the sorted per-cluster counts again.
dups
Cluster 4 748 1 479 3 136 2 67 0 12 dtype: int64
# Rows of the merged table that belong to cluster 1.
df1 = dfm.loc[dfm['Cluster'] == 1]
df1
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 639 | Fundación Cardioinfantil-Instituto De Cardiolo... | 2 | 2010.000000 | 366.0 | 38.0 | 22.0 | 19.0 | 95.0 | 22.0 | 0.0 | ... | 57.0 | 2.0 | 3.0 | 2.0 | 28.0 | 0.0 | 0.0 | 1.0 | 1.0 | 1 |
| 1333 | Universidad Distrital Francisco José De Caldas... | 124 | 2003.612903 | 9124.0 | 724.0 | 851.0 | 989.0 | 682.0 | 2354.0 | 66.0 | ... | 2988.0 | 726.0 | 889.0 | 122.0 | 601.0 | 77.0 | 2.0 | 168.0 | 36.0 | 1 |
| 1353 | Universidad Industrial De Santander Avalado | 91 | 2001.131868 | 9872.0 | 1870.0 | 975.0 | 1444.0 | 674.0 | 1136.0 | 429.0 | ... | 4501.0 | 826.0 | 1297.0 | 152.0 | 1143.0 | 88.0 | 3.0 | 187.0 | 94.0 | 1 |
| 729 | Fundación Universitaria Agraria De Colombia Av... | 12 | 2008.000000 | 277.0 | 56.0 | 39.0 | 60.0 | 14.0 | 152.0 | 8.0 | ... | 245.0 | 61.0 | 118.0 | 17.0 | 21.0 | 7.0 | 0.0 | 18.0 | 0.0 | 1 |
| 1391 | Universidad Pontificia Bolivariana Seccional M... | 8 | 2006.375000 | 286.0 | 66.0 | 47.0 | 34.0 | 20.0 | 194.0 | 1.0 | ... | 158.0 | 34.0 | 70.0 | 16.0 | 22.0 | 8.0 | 0.0 | 19.0 | 2.0 | 1 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 238 | Clínica Respiratoria Y De Alergias No Avalado | 1 | 1995.000000 | 109.0 | 14.0 | 6.0 | 12.0 | 13.0 | 35.0 | 0.0 | ... | 42.0 | 0.0 | 0.0 | 1.0 | 4.0 | 2.0 | 0.0 | 1.0 | 0.0 | 1 |
| 1378 | Universidad Nacional De Colombia Avalado | 621 | 2003.383253 | 50978.0 | 10304.0 | 5687.0 | 6429.0 | 4353.0 | 13554.0 | 526.0 | ... | 19521.0 | 4836.0 | 6238.0 | 620.0 | 3997.0 | 354.0 | 55.0 | 1007.0 | 508.0 | 1 |
| 510 | Escuela Latinoamericana De Ingenieros Tecnólog... | 3 | 2012.333333 | 111.0 | 3.0 | 6.0 | 15.0 | 9.0 | 110.0 | 1.0 | ... | 102.0 | 20.0 | 54.0 | 11.0 | 5.0 | 3.0 | 0.0 | 6.0 | 0.0 | 1 |
| 44 | Arkebios Sas No Avalado | 2 | 2001.000000 | 112.0 | 14.0 | 6.0 | 8.0 | 0.0 | 54.0 | 22.0 | ... | 88.0 | 18.0 | 30.0 | 8.0 | 14.0 | 2.0 | 0.0 | 4.0 | 0.0 | 1 |
| 191 | Centro Industrial Y De Energías Alternativas -... | 1 | 2011.000000 | 14.0 | 0.0 | 0.0 | 9.0 | 1.0 | 71.0 | 1.0 | ... | 30.0 | 4.0 | 13.0 | 7.0 | 5.0 | 1.0 | 0.0 | 3.0 | 0.0 | 1 |
479 rows × 23 columns
# Box plots for cluster 1: each metric group is drawn twice,
# coloured first by cluster and then by institution.
for _metrics in (['articulos', 'capitulos', 'trabajos_grado'],
                 ['innovaciones', 'libros', 'softwares']):
    for _hue in ("Cluster", 'Instituciones'):
        fig = px.box(df1, y=_metrics, color=_hue, points="all")
        fig.show()
# Rank cluster-1 institutions by article count and chart the first ten.
df1 = df1.sort_values(by='articulos', ascending=False)
df1s = df1.iloc[:10]
fig = px.pie(df1s, names='Instituciones', values='articulos')
fig.show()
# Rows of the merged table that belong to cluster 0.
df0 = dfm.loc[dfm['Cluster'] == 0]
df0
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 452 | Dirección Seccional De Salud De Antioquia No A... | 1 | 1989.000000 | 413.0 | 86.0 | 30.0 | 74.0 | 23.0 | 52.0 | 11.0 | ... | 100.0 | 25.0 | 26.0 | 7.0 | 22.0 | 2.0 | 1.0 | 6.0 | 7.0 | 0 |
| 333 | Corporación Centro Internacional De Entrenamie... | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
| 686 | Fundación Instituto De Inmunología De Colombia... | 2 | 1995.500000 | 749.0 | 400.0 | 106.0 | 26.0 | 11.0 | 28.0 | 6.0 | ... | 252.0 | 89.0 | 68.0 | 10.0 | 58.0 | 5.0 | 1.0 | 32.0 | 8.0 | 0 |
| 345 | Corporación De Innovación Para El Desarrollo D... | 1 | 1986.000000 | 509.0 | 180.0 | 77.0 | 69.0 | 40.0 | 22.0 | 6.0 | ... | 109.0 | 27.0 | 28.0 | 4.0 | 33.0 | 1.0 | 1.0 | 5.0 | 4.0 | 0 |
| 1352 | Universidad Icesi No Avalado | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
| 84 | Asociación Hortifrutícola De Colombia - Asohof... | 1 | 1999.000000 | 480.0 | 70.0 | 43.0 | 63.0 | 75.0 | 134.0 | 1.0 | ... | 64.0 | 27.0 | 16.0 | 1.0 | 13.0 | 3.0 | 1.0 | 2.0 | 5.0 | 0 |
| 896 | Instituto Colombiano De Neuropedagogia No Avalado | 1 | 1995.000000 | 392.0 | 64.0 | 32.0 | 69.0 | 99.0 | 69.0 | 1.0 | ... | 57.0 | 18.0 | 24.0 | 6.0 | 5.0 | 5.0 | 0.0 | 1.0 | 6.0 | 0 |
| 1143 | Sociedad Colombiana De Ciencias Hortícolas No ... | 1 | 1999.000000 | 480.0 | 70.0 | 43.0 | 63.0 | 75.0 | 134.0 | 1.0 | ... | 64.0 | 27.0 | 16.0 | 1.0 | 13.0 | 3.0 | 1.0 | 2.0 | 5.0 | 0 |
| 633 | Fundacion Valle Del Lili Avalado | 3 | 2005.333333 | 1523.0 | 452.0 | 269.0 | 284.0 | 198.0 | 94.0 | 3.0 | ... | 198.0 | 13.0 | 48.0 | 24.0 | 29.0 | 3.0 | 0.0 | 7.0 | 2.0 | 0 |
| 916 | Instituto De Investigación De Recursos Biológi... | 1 | 2010.000000 | 442.0 | 189.0 | 58.0 | 53.0 | 27.0 | 629.0 | 0.0 | ... | 158.0 | 30.0 | 70.0 | 8.0 | 39.0 | 2.0 | 0.0 | 15.0 | 1.0 | 0 |
| 332 | Corporación Centro Internacional De Entrenamie... | 1 | 1990.000000 | 455.0 | 229.0 | 44.0 | 68.0 | 7.0 | 11.0 | 0.0 | ... | 131.0 | 27.0 | 29.0 | 4.0 | 62.0 | 1.0 | 1.0 | 6.0 | 1.0 | 0 |
| 197 | Centro Internacional Para Prueba De Vacunas Y ... | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
12 rows × 23 columns
# Box plots for cluster 0: each metric group is drawn twice,
# coloured first by cluster and then by institution.
for _metrics in (['articulos', 'capitulos', 'trabajos_grado'],
                 ['innovaciones', 'libros', 'softwares']):
    for _hue in ("Cluster", 'Instituciones'):
        fig = px.box(df0, y=_metrics, color=_hue, points="all")
        fig.show()
# Rank cluster-0 institutions by article count and show the first five.
df0 = df0.sort_values(by='articulos', ascending=False)
df0h = df0.iloc[:5]
df0h
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 633 | Fundacion Valle Del Lili Avalado | 3 | 2005.333333 | 1523.0 | 452.0 | 269.0 | 284.0 | 198.0 | 94.0 | 3.0 | ... | 198.0 | 13.0 | 48.0 | 24.0 | 29.0 | 3.0 | 0.0 | 7.0 | 2.0 | 0 |
| 333 | Corporación Centro Internacional De Entrenamie... | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
| 1352 | Universidad Icesi No Avalado | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
| 197 | Centro Internacional Para Prueba De Vacunas Y ... | 1 | 1997.000000 | 933.0 | 315.0 | 148.0 | 155.0 | 103.0 | 53.0 | 2.0 | ... | 155.0 | 10.0 | 31.0 | 22.0 | 19.0 | 3.0 | 0.0 | 5.0 | 1.0 | 0 |
| 686 | Fundación Instituto De Inmunología De Colombia... | 2 | 1995.500000 | 749.0 | 400.0 | 106.0 | 26.0 | 11.0 | 28.0 | 6.0 | ... | 252.0 | 89.0 | 68.0 | 10.0 | 58.0 | 5.0 | 1.0 | 32.0 | 8.0 | 0 |
5 rows × 23 columns
# Pie chart of article counts for every cluster-0 institution
# (the whole `df0` table is plotted, not the five-row `df0h` subset).
fig = px.pie(df0, names='Instituciones', values='articulos')
fig.show()
# Rows of the merged table that belong to cluster 2.
df2 = dfm.loc[dfm['Cluster'] == 2]
df2
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 863 | Institución Educativa José María Córdob Avalado | 1 | 2010.000000 | 17.0 | 2.0 | 1.0 | 4.0 | 0.0 | 68.0 | 0.0 | ... | 70.0 | 20.0 | 29.0 | 4.0 | 4.0 | 4.0 | 0.0 | 11.0 | 2.0 | 2 |
| 833 | Icp- Instituto Colombiano De Petróleo No Avalado | 1 | 2014.000000 | 42.0 | 13.0 | 1.0 | 14.0 | 1.0 | 0.0 | 0.0 | ... | 47.0 | 13.0 | 28.0 | 1.0 | 2.0 | 4.0 | 0.0 | 3.0 | 1.0 | 2 |
| 185 | Centro De Investigación Y Desarrollo Tecnológi... | 2 | 1998.500000 | 101.0 | 37.0 | 12.0 | 10.0 | 9.0 | 22.0 | 5.0 | ... | 170.0 | 25.0 | 49.0 | 10.0 | 41.0 | 9.0 | 0.0 | 7.0 | 2.0 | 2 |
| 781 | Grupo Labservis Ltda No Avalado | 2 | 2003.500000 | 341.0 | 50.0 | 16.0 | 70.0 | 35.0 | 13.0 | 8.0 | ... | 102.0 | 35.0 | 36.0 | 1.0 | 24.0 | 4.0 | 0.0 | 10.0 | 3.0 | 2 |
| 678 | Fundación Hospital Universidad Del Norte Avalado | 1 | 2003.000000 | 119.0 | 55.0 | 26.0 | 10.0 | 9.0 | 18.0 | 0.0 | ... | 36.0 | 21.0 | 8.0 | 0.0 | 3.0 | 2.0 | 0.0 | 5.0 | 5.0 | 2 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 559 | Fundacion Canguro Avalado | 1 | 1989.000000 | 96.0 | 41.0 | 8.0 | 16.0 | 4.0 | 14.0 | 0.0 | ... | 46.0 | 10.0 | 11.0 | 7.0 | 13.0 | 3.0 | 1.0 | 0.0 | 2.0 | 2 |
| 727 | Fundación Universidad Del Norte Avalado | 42 | 2001.404762 | 5531.0 | 1152.0 | 650.0 | 604.0 | 502.0 | 1891.0 | 52.0 | ... | 1746.0 | 592.0 | 548.0 | 77.0 | 338.0 | 73.0 | 6.0 | 106.0 | 80.0 | 2 |
| 370 | Corporación Para El Desarrollo De La Biotecnol... | 2 | 1999.500000 | 64.0 | 4.0 | 4.0 | 5.0 | 6.0 | 9.0 | 7.0 | ... | 85.0 | 21.0 | 24.0 | 6.0 | 19.0 | 4.0 | 2.0 | 4.0 | 1.0 | 2 |
| 666 | Fundación General De Apoyo A La Universidad De... | 3 | 1997.000000 | 313.0 | 56.0 | 23.0 | 33.0 | 22.0 | 62.0 | 0.0 | ... | 111.0 | 42.0 | 34.0 | 2.0 | 17.0 | 6.0 | 0.0 | 10.0 | 4.0 | 2 |
| 429 | Corporación Vidarium, Centro De Investigación ... | 1 | 1999.000000 | 174.0 | 54.0 | 8.0 | 17.0 | 40.0 | 29.0 | 1.0 | ... | 95.0 | 10.0 | 43.0 | 5.0 | 19.0 | 2.0 | 0.0 | 2.0 | 4.0 | 2 |
67 rows × 23 columns
# Box plots for cluster 2: each metric group is drawn twice,
# coloured first by cluster and then by institution.
for _metrics in (['articulos', 'capitulos', 'trabajos_grado'],
                 ['innovaciones', 'libros', 'softwares']):
    for _hue in ("Cluster", 'Instituciones'):
        fig = px.box(df2, y=_metrics, color=_hue, points="all")
        fig.show()
# Rank cluster-2 institutions by article count and show the first five.
df2 = df2.sort_values(by='articulos', ascending=False)
df2.iloc[:5]
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 727 | Fundación Universidad Del Norte Avalado | 42 | 2001.404762 | 5531.0 | 1152.0 | 650.0 | 604.0 | 502.0 | 1891.0 | 52.0 | ... | 1746.0 | 592.0 | 548.0 | 77.0 | 338.0 | 73.0 | 6.0 | 106.0 | 80.0 | 2 |
| 1407 | Universidad Simón Bolívar Avalado | 44 | 2003.045455 | 4054.0 | 676.0 | 332.0 | 864.0 | 716.0 | 2185.0 | 415.0 | ... | 1588.0 | 402.0 | 543.0 | 105.0 | 278.0 | 117.0 | 8.0 | 121.0 | 72.0 | 2 |
| 1218 | Universidad Autonoma De Manizales Avalado | 15 | 2000.533333 | 1643.0 | 108.0 | 150.0 | 147.0 | 143.0 | 299.0 | 33.0 | ... | 892.0 | 215.0 | 339.0 | 53.0 | 157.0 | 36.0 | 3.0 | 61.0 | 23.0 | 2 |
| 622 | Fundacion Universitaria Konrad Lorenz Avalado | 4 | 2001.750000 | 608.0 | 145.0 | 136.0 | 140.0 | 51.0 | 217.0 | 0.0 | ... | 248.0 | 54.0 | 71.0 | 8.0 | 42.0 | 16.0 | 0.0 | 8.0 | 7.0 | 2 |
| 877 | Institución Universitaria Pascual Bravo Avalado | 5 | 2007.200000 | 406.0 | 81.0 | 109.0 | 63.0 | 37.0 | 84.0 | 32.0 | ... | 244.0 | 44.0 | 106.0 | 19.0 | 34.0 | 9.0 | 0.0 | 23.0 | 2.0 | 2 |
5 rows × 23 columns
# Sort cluster 2 by article count again and chart the first ten institutions.
df2 = df2.sort_values(by='articulos', ascending=False)
df2s = df2.iloc[:10]
fig = px.pie(df2s, names='Instituciones', values='articulos')
fig.show()
# Rows of the merged table that belong to cluster 3.
df3 = dfm.loc[dfm['Cluster'] == 3]
df3
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1106 | Scare/Fepasde No Avalado | 1 | 2008.0 | 79.0 | 3.0 | 2.0 | 14.0 | 8.0 | 23.0 | 0.0 | ... | 84.0 | 0.0 | 1.0 | 7.0 | 12.0 | 1.0 | 0.0 | 0.0 | 0.0 | 3 |
| 324 | Corporación Centro De Desarrollo Tecnologico D... | 1 | 2003.0 | 14.0 | 2.0 | 1.0 | 5.0 | 2.0 | 0.0 | 9.0 | ... | 67.0 | 2.0 | 5.0 | 14.0 | 35.0 | 0.0 | 0.0 | 0.0 | 0.0 | 3 |
| 695 | Fundación Logyca / Investigación Avalado | 1 | 2008.0 | 49.0 | 18.0 | 10.0 | 5.0 | 2.0 | 28.0 | 0.0 | ... | 58.0 | 10.0 | 16.0 | 6.0 | 20.0 | 0.0 | 0.0 | 0.0 | 0.0 | 3 |
| 977 | Jardín Botánico De Bogotá José Celestino Mutis... | 2 | 2008.5 | 119.0 | 10.0 | 11.0 | 20.0 | 17.0 | 51.0 | 1.0 | ... | 107.0 | 5.0 | 47.0 | 10.0 | 32.0 | 1.0 | 0.0 | 1.0 | 0.0 | 3 |
| 272 | Conservatorio Del Tolima Avalado | 1 | 2003.0 | 22.0 | 0.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | ... | 44.0 | 1.0 | 18.0 | 4.0 | 8.0 | 0.0 | 0.0 | 0.0 | 0.0 | 3 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 37 | Andina Diseñadores No Avalado | 1 | 2014.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 3.0 | 2.0 | ... | 53.0 | 1.0 | 11.0 | 9.0 | 12.0 | 0.0 | 0.0 | 2.0 | 0.0 | 3 |
| 118 | Caimed Sas Avalado | 1 | 2007.0 | 27.0 | 22.0 | 0.0 | 1.0 | 2.0 | 5.0 | 0.0 | ... | 43.0 | 7.0 | 7.0 | 9.0 | 9.0 | 0.0 | 0.0 | 1.0 | 1.0 | 3 |
| 503 | Escuela De Inteligencia Y Contrainteligencia B... | 2 | 2012.5 | 51.0 | 0.0 | 2.0 | 2.0 | 0.0 | 21.0 | 2.0 | ... | 110.0 | 7.0 | 29.0 | 6.0 | 23.0 | 0.0 | 0.0 | 2.0 | 0.0 | 3 |
| 17 | Agremiacion De Gineco-Obstetras De Cartagena Y... | 1 | 2007.0 | 235.0 | 55.0 | 32.0 | 18.0 | 17.0 | 50.0 | 1.0 | ... | 131.0 | 1.0 | 9.0 | 6.0 | 52.0 | 0.0 | 0.0 | 2.0 | 1.0 | 3 |
| 939 | Instituto Nacional De Metrologia - Inm Avalado | 2 | 2013.5 | 64.0 | 23.0 | 5.0 | 17.0 | 5.0 | 2.0 | 0.0 | ... | 86.0 | 3.0 | 31.0 | 10.0 | 28.0 | 0.0 | 0.0 | 2.0 | 0.0 | 3 |
136 rows × 23 columns
# Box plots (with every point drawn) for the cluster-3 rows: first the
# article/chapter/innovation/thesis counts, then books and software, each
# coloured once by cluster label and once by institution.
production_columns = ['articulos', 'capitulos', 'innovaciones', 'trabajos_grado']
book_software_columns = ['libros', 'softwares']
for value_columns in (production_columns, book_software_columns):
    for color_column in ("Cluster", 'Instituciones'):
        fig = px.box(df3, y=value_columns, points="all", color=color_column)
        fig.show()
# Order the cluster-3 rows from most to fewest articles and preview the top five.
df3 = df3.sort_values('articulos', ascending=False)
df3.head(5)
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1126 | Servicio Nacional De Aprendizaje Sena Avalado | 97 | 2012.412371 | 1045.0 | 103.0 | 70.0 | 160.0 | 75.0 | 829.0 | 163.0 | ... | 4773.0 | 214.0 | 1313.0 | 919.0 | 887.0 | 21.0 | 0.0 | 135.0 | 1.0 | 3 |
| 1399 | Universidad Santo Tomas Seccional Tunja Avalado | 10 | 2010.200000 | 783.0 | 28.0 | 16.0 | 31.0 | 26.0 | 269.0 | 43.0 | ... | 491.0 | 89.0 | 210.0 | 51.0 | 96.0 | 7.0 | 0.0 | 26.0 | 1.0 | 3 |
| 484 | Empresa Social Del Estado Hospital Universitar... | 4 | 2001.500000 | 567.0 | 79.0 | 48.0 | 113.0 | 47.0 | 123.0 | 0.0 | ... | 298.0 | 11.0 | 35.0 | 23.0 | 73.0 | 4.0 | 0.0 | 9.0 | 4.0 | 3 |
| 200 | Centro Medico Imbanaco De Cali S.A. Avalado | 2 | 2002.000000 | 403.0 | 55.0 | 27.0 | 54.0 | 72.0 | 29.0 | 2.0 | ... | 142.0 | 4.0 | 27.0 | 12.0 | 16.0 | 0.0 | 0.0 | 5.0 | 1.0 | 3 |
| 394 | Corporación Universidad Piloto De Colombia Ava... | 6 | 2002.666667 | 381.0 | 29.0 | 19.0 | 60.0 | 17.0 | 187.0 | 35.0 | ... | 395.0 | 58.0 | 172.0 | 46.0 | 60.0 | 5.0 | 0.0 | 20.0 | 0.0 | 3 |
5 rows × 23 columns
# Rank the cluster-3 rows by article count and chart the ten largest as
# shares of a pie.
df3 = df3.sort_values('articulos', ascending=False)
df3s = df3.iloc[:10]
fig = px.pie(data_frame=df3s, names='Instituciones', values='articulos')
fig.show()
# Keep only the rows of dfm whose Cluster label is 4, then display them.
in_cluster_4 = dfm['Cluster'] == 4
df4 = dfm.loc[in_cluster_4]
df4
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1176 | Team Ingenieria De Conocimiento Ltda Avalado | 2 | 2002.0 | 34.0 | 2.0 | 1.0 | 1.0 | 3.0 | 11.0 | 13.0 | ... | 42.0 | 6.0 | 9.0 | 5.0 | 16.0 | 1.0 | 0.0 | 1.0 | 0.0 | 4 |
| 957 | Instituto Tecnológico Del Putumayo - Itp Avalado | 2 | 2000.0 | 14.0 | 3.0 | 0.0 | 6.0 | 1.0 | 3.0 | 0.0 | ... | 60.0 | 2.0 | 12.0 | 7.0 | 12.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 56 | Asociacion De Profesionales Para La Investigac... | 1 | 2017.0 | 14.0 | 4.0 | 0.0 | 4.0 | 1.0 | 1.0 | 0.0 | ... | 7.0 | 3.0 | 3.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4.0 | 0.0 | 4 |
| 1048 | Open Innovation Lab Sas Avalado | 1 | 2006.0 | 14.0 | 0.0 | 0.0 | 0.0 | 1.0 | 51.0 | 0.0 | ... | 23.0 | 6.0 | 9.0 | 0.0 | 5.0 | 0.0 | 0.0 | 1.0 | 0.0 | 4 |
| 12 | Administrative Management Consultants Sas Avalado | 2 | 2013.5 | 14.0 | 0.0 | 0.0 | 9.0 | 1.0 | 31.0 | 0.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 320 | Corporación Autónoma Regional Del Centro De An... | 1 | 2010.0 | 61.0 | 10.0 | 16.0 | 5.0 | 3.0 | 12.0 | 0.0 | ... | 5.0 | 0.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 487 | Empresas Públicas De Medellín E.S.P. No Avalado | 1 | 2010.0 | 61.0 | 10.0 | 16.0 | 5.0 | 3.0 | 12.0 | 0.0 | ... | 5.0 | 0.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
| 654 | Fundación Ciudad De Cali Para La Educación Y E... | 2 | 2008.5 | 54.0 | 0.0 | 1.0 | 0.0 | 2.0 | 39.0 | 0.0 | ... | 37.0 | 9.0 | 13.0 | 5.0 | 6.0 | 0.0 | 0.0 | 3.0 | 0.0 | 4 |
| 1254 | Universidad De Bayreuth No Avalado | 1 | 2008.0 | 57.0 | 30.0 | 17.0 | 6.0 | 3.0 | 1.0 | 0.0 | ... | 18.0 | 7.0 | 3.0 | 0.0 | 3.0 | 0.0 | 0.0 | 1.0 | 1.0 | 4 |
| 160 | Centro De Estudios En Protección Social Y Econ... | 1 | 2010.0 | 57.0 | 25.0 | 13.0 | 4.0 | 5.0 | 8.0 | 0.0 | ... | 16.0 | 1.0 | 9.0 | 0.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4 |
748 rows × 23 columns
# Box plots (with every point drawn) for the cluster-4 rows: first the
# article/chapter/innovation/thesis counts, then books and software, each
# coloured once by cluster label and once by institution.
production_columns = ['articulos', 'capitulos', 'innovaciones', 'trabajos_grado']
book_software_columns = ['libros', 'softwares']
for value_columns in (production_columns, book_software_columns):
    for color_column in ("Cluster", 'Instituciones'):
        fig = px.box(df4, y=value_columns, points="all", color=color_column)
        fig.show()
# Order the cluster-4 rows from most to fewest articles and preview the top five.
df4 = df4.sort_values('articulos', ascending=False)
df4.head(5)
| Instituciones | grupo | year | articulos | SJR_Q_Q1 | SJR_Q_Q2 | SJR_Q_Q3 | SJR_Q_Q4 | capitulos | innovaciones | ... | integrantes | doctorado | maestria | Especializacion | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | Cluster | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1279 | Universidad De La Guajira Avalado | 55 | 2009.236364 | 1310.0 | 75.0 | 81.0 | 307.0 | 157.0 | 1286.0 | 47.0 | ... | 969.0 | 222.0 | 348.0 | 56.0 | 153.0 | 23.0 | 0.0 | 97.0 | 7.0 | 4 |
| 810 | Hospital Militar Central Avalado | 17 | 2009.352941 | 811.0 | 151.0 | 104.0 | 67.0 | 113.0 | 61.0 | 0.0 | ... | 492.0 | 19.0 | 53.0 | 55.0 | 74.0 | 7.0 | 0.0 | 16.0 | 2.0 | 4 |
| 1245 | Universidad Colegio Mayor De Cundinamarca Avalado | 24 | 2006.291667 | 769.0 | 86.0 | 53.0 | 67.0 | 52.0 | 491.0 | 27.0 | ... | 366.0 | 37.0 | 124.0 | 32.0 | 69.0 | 5.0 | 0.0 | 19.0 | 0.0 | 4 |
| 928 | Instituto Nacional De Cancerologia Ese Avalado | 8 | 2010.250000 | 740.0 | 127.0 | 44.0 | 91.0 | 78.0 | 35.0 | 0.0 | ... | 122.0 | 10.0 | 34.0 | 15.0 | 11.0 | 0.0 | 0.0 | 10.0 | 0.0 | 4 |
| 223 | Clínica Ces Avalado | 6 | 2006.000000 | 682.0 | 98.0 | 50.0 | 42.0 | 200.0 | 176.0 | 1.0 | ... | 118.0 | 3.0 | 23.0 | 18.0 | 19.0 | 0.0 | 0.0 | 4.0 | 5.0 | 4 |
5 rows × 23 columns
# Rank the cluster-4 rows by article count and chart the ten largest as
# shares of a pie.
df4 = df4.sort_values('articulos', ascending=False)
df4s = df4.iloc[:10]
fig = px.pie(data_frame=df4s, names='Instituciones', values='articulos')
fig.show()
# Show the column labels of the institutions table loaded into df.
df.columns
Index(['Instituciones', 'grupo', 'year', 'articulos', 'SJR_Q_Q1', 'SJR_Q_Q2',
'SJR_Q_Q3', 'SJR_Q_Q4', 'capitulos', 'innovaciones', 'libros',
'softwares', 'trabajos_grado', 'integrantes', 'doctorado', 'maestria',
'Especializacion', 'pregrado', 'Investigador_Asociado',
'Investigador_Emerito', 'Investigador_Junior', 'Investigador Senior'],
dtype='object')
# Pivot table: count how many rows of df share each value of `grupo`.
dups = pd.pivot_table(df, index=['grupo'], aggfunc='size')
dups
grupo
0 3
1 937
2 167
3 60
4 41
...
155 1
159 1
190 1
262 1
621 1
Length: 68, dtype: int64
# Reorder the per-`grupo` row counts from largest to smallest and display them.
dups = dups.sort_values(ascending=False)
dups
grupo
1 937
2 167
3 60
4 41
5 23
...
48 1
44 1
40 1
32 1
621 1
Length: 68, dtype: int64
# Plot the per-`grupo` row counts held in dups twice: as a kernel density
# estimate and as a pie chart.
#
# Series.plot draws on the current matplotlib axes whenever a figure is
# already open, so each chart is given its own figure; otherwise the pie
# would be painted over the density curve when both statements run together.
kde_fig, kde_axes = plt.subplots()
ax = dups.plot.kde(ax=kde_axes)

# The former y='grupo' argument is dropped: `y` selects a DataFrame column
# and is ignored when plotting a Series such as dups.
pie_fig, pie_axes = plt.subplots(figsize=(5, 5))
plot = dups.plot.pie(ax=pie_axes)
Cluster.infoGrupos.csv https://drive.google.com/drive/u/0/folders/1APVnfD1zPgTHFAr0YMG6UMTwZ52MQVa9
# Load the per-group table from the CSV in the current working directory
# and display it.
dfg = pd.read_csv("Cluster.infoGrupos.csv")
dfg
| Codigo del grupo | Nombre grupo | Lider | Avalado | Estado | Clasificado en | link_grupos | link_perfiles | Instituciones | fecha_creacion | ... | trabajos_grado | integrantes | doctorado | Especializacion | maestria | pregrado | Investigador_Asociado | Investigador_Emerito | Investigador_Junior | Investigador Senior | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | COL0024623 | Biotecnologia vegetal | Giovanni Orlando Cancino Escalante | 1 de 1 | Categoría C | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Universidad De Pamplona Avalado | Febrero de 2003. | ... | 38.0 | 47.0 | 16.0 | 1.0 | 15.0 | 10.0 | 4.0 | 0.0 | 7.0 | 0.0 |
| 1 | COL0137494 | Grupo de investigación en agricultura biológica | Lucia Ana Diaz Ariza | 1 de 2 | Categoría C | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Pontificia Universidad Javeriana Avalado | Octubre de 2011. | ... | 54.0 | 24.0 | 7.0 | 0.0 | 13.0 | 1.0 | 1.0 | 0.0 | 1.0 | 1.0 |
| 2 | COL0102962 | Rg microbial ecology: metabolism, genomics & e... | Howard Junca Diaz | 3 de 5 | Grupo reconocido | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Corporación Corpogen No Avalado | Enero de 2010. | ... | 5.0 | 6.0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 3.0 | 0.0 |
| 3 | COL0102962 | Rg microbial ecology: metabolism, genomics & e... | Howard Junca Diaz | 3 de 5 | Grupo reconocido | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Asociacion Fundacion De Investigacion Microbio... | Enero de 2010. | ... | 5.0 | 6.0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 3.0 | 0.0 |
| 4 | COL0102962 | Rg microbial ecology: metabolism, genomics & e... | Howard Junca Diaz | 3 de 5 | Grupo reconocido | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Compañia Campo Colombia Avalado | Enero de 2010. | ... | 5.0 | 6.0 | 4.0 | 0.0 | 0.0 | 1.0 | 1.0 | 0.0 | 3.0 | 0.0 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 7886 | COL0155269 | Grupo de investigación socio jurídico - gisoju | NaN | 3 de 6 | Categoría C | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Universidad Francisco De Paula Santander Ocaña... | Mayo de 2014. | ... | 34.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| 7887 | COL0187772 | Parrhesía, grupo de investigación en filosofía... | NaN | 1 de 1 | Categoría C | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Universitaria Agustiniana Avalado | Diciembre de 2014. | ... | 33.0 | 7.0 | 2.0 | 0.0 | 4.0 | 1.0 | 0.0 | 0.0 | 1.0 | 0.0 |
| 7888 | COL0155699 | Trabajo social, derechos humanos y desarrollo ... | NaN | 1 de 2 | Grupo reconocido | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Corporacion Universitaria Rafael Nuñez Avalado | Enero de 2013. | ... | 19.0 | 6.0 | 0.0 | 0.0 | 5.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| 7889 | COL0205253 | Investigación e innovación para la educación, ... | NaN | 1 de 2 | Categoría C | Convocatoria 833 de 2018 | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Organizacion De Estados Iberoamericanos Oei Av... | Enero de 2015. | ... | 18.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| 7890 | COL0211751 | Grupo de estudios creativos de la universidad ... | NaN | 1 de 2 | Categoría 00 | Sin Reconocer | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | Colegio Mayor Nuestra Señora Del Rosario Avalado | Diciembre de 2019. | ... | 0.0 | 4.0 | 1.0 | 0.0 | 3.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
7891 rows × 33 columns
# Show the column labels of the groups table.
dfg.columns
Index(['Codigo del grupo', 'Nombre grupo', 'Lider', 'Avalado', 'Estado',
'Clasificado en', 'link_grupos', 'link_perfiles', 'Instituciones',
'fecha_creacion', 'lugar_creacion', 'year', 'grupo', 'articulos',
'SJR_Q_Q1', 'SJR_Q_Q2', 'SJR_Q_Q3', 'SJR_Q_Q4', 'SJR_Q_Sin categoria',
'capitulos', 'innovaciones', 'libros', 'softwares', 'trabajos_grado',
'integrantes', 'doctorado', 'Especializacion', 'maestria', 'pregrado',
'Investigador_Asociado', 'Investigador_Emerito', 'Investigador_Junior',
'Investigador Senior'],
dtype='object')
# Display the groups table transposed (one column per row of dfg) so that
# every field of a record can be read top to bottom.
dfg.T
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | ... | 7881 | 7882 | 7883 | 7884 | 7885 | 7886 | 7887 | 7888 | 7889 | 7890 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| Codigo del grupo | COL0024623 | COL0137494 | COL0102962 | COL0102962 | COL0102962 | COL0007829 | COL0031449 | COL0029138 | COL0001029 | COL0008871 | ... | COL0052252 | COL0188072 | COL0105347 | COL0185169 | COL0178915 | COL0155269 | COL0187772 | COL0155699 | COL0205253 | COL0211751 |
| Nombre grupo | Biotecnologia vegetal | Grupo de investigación en agricultura biológica | Rg microbial ecology: metabolism, genomics & e... | Rg microbial ecology: metabolism, genomics & e... | Rg microbial ecology: metabolism, genomics & e... | Grupo de biotecnología-productos naturales | Alimentos y agroindustria | Sistemas agrícolas del trópico (sat) | Bioprocesos y bioprospección | Grupo de investigaciones en ingenieria biomédi... | ... | Grupo de investigación en diseńo, imagen y com... | Grupo de investigación ceinfes | Grupo de investigaciones empresariales (grinem) | Estudios y análisis del espacio público | Diseńo y comunicación audiovisual | Grupo de investigación socio jurídico - gisoju | Parrhesía, grupo de investigación en filosofía... | Trabajo social, derechos humanos y desarrollo ... | Investigación e innovación para la educación, ... | Grupo de estudios creativos de la universidad ... |
| Lider | Giovanni Orlando Cancino Escalante | Lucia Ana Diaz Ariza | Howard Junca Diaz | Howard Junca Diaz | Howard Junca Diaz | Oscar Marino Mosquera Martinez | Oscar Julian Sanchez Toro | Angela Arcila Cardona | Dolly Montoya Castano | Clara Eugenia Goyes Lopez | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
| Avalado | 1 de 1 | 1 de 2 | 3 de 5 | 3 de 5 | 3 de 5 | 1 de 1 | 1 de 1 | 1 de 1 | 1 de 1 | 1 de 1 | ... | 1 de 1 | 1 de 1 | 2 de 3 | 1 de 1 | 1 de 1 | 3 de 6 | 1 de 1 | 1 de 2 | 1 de 2 | 1 de 2 |
| Estado | Categoría C | Categoría C | Grupo reconocido | Grupo reconocido | Grupo reconocido | Categoría B | Categoría A1 | Categoría A1 | Categoría A | Categoría A | ... | Categoría B | Categoría C | Categoría 00 | Categoría C | Categoría C | Categoría C | Categoría C | Grupo reconocido | Categoría C | Categoría 00 |
| Clasificado en | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | ... | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Convocatoria 833 de 2018 | Sin Reconocer |
| link_grupos | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | ... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... |
| link_perfiles | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | ... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... | https://scienti.minciencias.gov.co/gruplac/jsp... |
| Instituciones | Universidad De Pamplona Avalado | Pontificia Universidad Javeriana Avalado | Corporación Corpogen No Avalado | Asociacion Fundacion De Investigacion Microbio... | Compañia Campo Colombia Avalado | Universidad Tecnológica De Pereira Avalado | Universidad De Caldas Avalado | Corporación Colombiana De Investigación Agrope... | Universidad Nacional De Colombia Avalado | Universidad Autonoma De Occidente Avalado | ... | Corporación Universidad De Investigación Y Des... | Centro De Investigación Y Formación Para La Ed... | Institución Univesitaria Latina Avalado | Departamento Administrativo Defensoría Del Esp... | Taller Cinco Centro De Diseño Avalado | Universidad Francisco De Paula Santander Ocaña... | Universitaria Agustiniana Avalado | Corporacion Universitaria Rafael Nuñez Avalado | Organizacion De Estados Iberoamericanos Oei Av... | Colegio Mayor Nuestra Señora Del Rosario Avalado |
| fecha_creacion | Febrero de 2003. | Octubre de 2011. | Enero de 2010. | Enero de 2010. | Enero de 2010. | Enero de 1996. | Enero de 2002. | Septiembre de 2004. | Febrero de 1995. | Enero de 2000. | ... | Septiembre de 2004. | Enero de 2017. | Abril de 2010. | Enero de 2016. | Enero de 2016. | Mayo de 2014. | Diciembre de 2014. | Enero de 2013. | Enero de 2015. | Diciembre de 2019. |
| lugar_creacion | PAMPLONA / NORTE DE SANTANDER / Centro -... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | CHÍA / CUNDINAMARCA / Centro - Oriente ... | CHÍA / CUNDINAMARCA / Centro - Oriente ... | CHÍA / CUNDINAMARCA / Centro - Oriente ... | PEREIRA / RISARALDA / Región Eje Cafeter... | MANIZALES / CALDAS / Región Eje Cafetero... | MOSQUERA / CUNDINAMARCA / Centro - Orien... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | CALI / VALLE DEL CAUCA / Región Pacífico... | ... | BUCARAMANGA / SANTANDER / Centro - Orien... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | CHÍA / CUNDINAMARCA / Centro - Oriente ... | OCAÑA / NORTE DE SANTANDER / Centro - Or... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | CARTAGENA DE INDIAS / BOLÍVAR / Región C... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... | BOGOTÁ, D.C. / BOGOTÁ, D. C. / Distrito ... |
| year | 2003 | 2011 | 2010 | 2010 | 2010 | 1996 | 2002 | 2004 | 1995 | 2000 | ... | 2004 | 2017 | 2010 | 2016 | 2016 | 2014 | 2014 | 2013 | 2015 | 2019 |
| grupo | Biotecnologia vegetal | Grupo de investigación en agricultura biológica | Rg microbial ecology: metabolism, genomics & e... | Rg microbial ecology: metabolism, genomics & e... | Rg microbial ecology: metabolism, genomics & e... | Grupo de biotecnología-productos naturales | Alimentos y agroindustria | Sistemas agrícolas del trópico (sat) | Bioprocesos y bioprospección | Grupo de investigaciones en ingenieria biomédi... | ... | Grupo de investigación en diseńo, imagen y com... | Grupo de investigación ceinfes | Grupo de investigaciones empresariales (grinem) | Estudios y análisis del espacio público | Diseńo y comunicación audiovisual | Grupo de investigación socio jurídico - gisoju | Parrhesía, grupo de investigación en filosofía... | Trabajo social, derechos humanos y desarrollo ... | Investigación e innovación para la educación, ... | Grupo de estudios creativos de la universidad ... |
| articulos | 35.0 | 18.0 | 30.0 | 30.0 | 30.0 | 59.0 | 162.0 | 203.0 | 110.0 | 49.0 | ... | 15.0 | 8.0 | 0.0 | 6.0 | 0.0 | 6.0 | 16.0 | 6.0 | 8.0 | 1.0 |
| SJR_Q_Q1 | 0.0 | 4.0 | 26.0 | 26.0 | 26.0 | 5.0 | 26.0 | 32.0 | 10.0 | 7.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 1.0 | 5.0 | 1.0 |
| SJR_Q_Q2 | 1.0 | 3.0 | 3.0 | 3.0 | 3.0 | 16.0 | 23.0 | 14.0 | 12.0 | 6.0 | ... | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 1.0 | 0.0 | 1.0 | 0.0 |
| SJR_Q_Q3 | 5.0 | 5.0 | 1.0 | 1.0 | 1.0 | 6.0 | 30.0 | 34.0 | 18.0 | 6.0 | ... | 0.0 | 3.0 | 0.0 | 1.0 | 0.0 | 2.0 | 3.0 | 0.0 | 1.0 | 0.0 |
| SJR_Q_Q4 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 6.0 | 5.0 | 24.0 | 5.0 | 3.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4.0 | 0.0 | 0.0 | 0.0 |
| SJR_Q_Sin categoria | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 3.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| capitulos | 1.0 | 9.0 | 7.0 | 7.0 | 7.0 | 6.0 | 14.0 | 50.0 | 10.0 | 9.0 | ... | 1.0 | 30.0 | 0.0 | 1.0 | 2.0 | 1.0 | 12.0 | 4.0 | 1.0 | 0.0 |
| innovaciones | 0.0 | 0.0 | 15.0 | 15.0 | 15.0 | 1.0 | 6.0 | 1.0 | 23.0 | 5.0 | ... | 5.0 | 0.0 | 12.0 | 0.0 | 9.0 | 0.0 | 1.0 | 2.0 | 0.0 | 0.0 |
| libros | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | ... | 0.0 | 4.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| softwares | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 3.0 | 3.0 | 0.0 | 5.0 | ... | 12.0 | 0.0 | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 |
| trabajos_grado | 38.0 | 54.0 | 5.0 | 5.0 | 5.0 | 107.0 | 119.0 | 73.0 | 154.0 | 132.0 | ... | 320.0 | 9.0 | 39.0 | 0.0 | 31.0 | 34.0 | 33.0 | 19.0 | 18.0 | 0.0 |
| integrantes | 47.0 | 24.0 | 6.0 | 6.0 | 6.0 | 49.0 | 68.0 | 96.0 | 104.0 | 38.0 | ... | 23.0 | 0.0 | 21.0 | 17.0 | 0.0 | 0.0 | 7.0 | 6.0 | 0.0 | 4.0 |
| doctorado | 16.0 | 7.0 | 4.0 | 4.0 | 4.0 | 6.0 | 23.0 | 20.0 | 21.0 | 14.0 | ... | 3.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 2.0 | 0.0 | 0.0 | 1.0 |
| Especializacion | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 4.0 | 3.0 | 1.0 | 2.0 | ... | 1.0 | 0.0 | 0.0 | 6.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| maestria | 15.0 | 13.0 | 0.0 | 0.0 | 0.0 | 8.0 | 24.0 | 43.0 | 29.0 | 9.0 | ... | 16.0 | 0.0 | 9.0 | 4.0 | 0.0 | 0.0 | 4.0 | 5.0 | 0.0 | 3.0 |
| pregrado | 10.0 | 1.0 | 1.0 | 1.0 | 1.0 | 13.0 | 10.0 | 18.0 | 41.0 | 12.0 | ... | 2.0 | 0.0 | 2.0 | 2.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 |
| Investigador_Asociado | 4.0 | 1.0 | 1.0 | 1.0 | 1.0 | 0.0 | 3.0 | 4.0 | 4.0 | 4.0 | ... | 2.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| Investigador_Emerito | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
| Investigador_Junior | 7.0 | 1.0 | 3.0 | 3.0 | 3.0 | 1.0 | 11.0 | 16.0 | 2.0 | 7.0 | ... | 1.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 |
| Investigador Senior | 0.0 | 1.0 | 0.0 | 0.0 | 0.0 | 1.0 | 6.0 | 1.0 | 0.0 | 1.0 | ... | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
33 rows × 7891 columns
# Display only the institution and group-name columns of the groups table.
institution_group_columns = ['Instituciones', 'Nombre grupo']
dfg.filter(items=institution_group_columns)
| Instituciones | Nombre grupo | |
|---|---|---|
| 0 | Universidad De Pamplona Avalado | Biotecnologia vegetal |
| 1 | Pontificia Universidad Javeriana Avalado | Grupo de investigación en agricultura biológica |
| 2 | Corporación Corpogen No Avalado | Rg microbial ecology: metabolism, genomics & e... |
| 3 | Asociacion Fundacion De Investigacion Microbio... | Rg microbial ecology: metabolism, genomics & e... |
| 4 | Compañia Campo Colombia Avalado | Rg microbial ecology: metabolism, genomics & e... |
| ... | ... | ... |
| 7886 | Universidad Francisco De Paula Santander Ocaña... | Grupo de investigación socio jurídico - gisoju |
| 7887 | Universitaria Agustiniana Avalado | Parrhesía, grupo de investigación en filosofía... |
| 7888 | Corporacion Universitaria Rafael Nuñez Avalado | Trabajo social, derechos humanos y desarrollo ... |
| 7889 | Organizacion De Estados Iberoamericanos Oei Av... | Investigación e innovación para la educación, ... |
| 7890 | Colegio Mayor Nuestra Señora Del Rosario Avalado | Grupo de estudios creativos de la universidad ... |
7891 rows × 2 columns
# Count how many rows of the groups table mention each institution
# (value_counts returns the counts ordered from most to least frequent).
institution_column = dfg['Instituciones']
dfgi = institution_column.value_counts()
dfgi
Universidad Nacional De Colombia Avalado 621
Universidad De Antioquia Avalado 262
Universidad Del Valle Avalado 190
Universidad De Los Andes Avalado 159
Universidad Pedagógica Y Tecnológica De Colombia Avalado 155
...
SL Avalado 1
Hospital Universitario De La Samaritana - H.U.S. No Avalado 1
Asociación De Profesionales En Administración Pública, Municipal Y Regional - Aspapmur No Avalado 1
Cadena Productiva De Plantas Medicinales Y Aromáticas Del Departamento De Risaralda No Avalado 1
Organizacion De Estados Iberoamericanos Oei Avalado 1
Name: Instituciones, Length: 1442, dtype: int64
# Preview the ten institutions with the highest row counts.
dfgi.head(10)
Universidad Nacional De Colombia Avalado 621 Universidad De Antioquia Avalado 262 Universidad Del Valle Avalado 190 Universidad De Los Andes Avalado 159 Universidad Pedagógica Y Tecnológica De Colombia Avalado 155 Universidad Distrital Francisco José De Caldas Avalado 124 Universidad Tecnológica De Pereira Avalado 117 Pontificia Universidad Javeriana Avalado 112 Universidad De Cartagena Avalado 99 Servicio Nacional De Aprendizaje Sena Avalado 97 Name: Instituciones, dtype: int64
# Keep only the ten most frequent institutions (dfgi comes from value_counts,
# so it is already ordered from most to least frequent) and chart their shares.
dfgi = dfgi.head(10)

# The pie gets its own figure so it is never drawn onto axes left open by an
# earlier plot. The former y='grupo' argument is dropped: dfgi is a Series of
# institution counts, and `y` is ignored when plotting a Series.
pie_fig, pie_axes = plt.subplots(figsize=(5, 5))
plot = dfgi.plot.pie(ax=pie_axes)